<!DOCTYPE html>
<html xmlns="http://www.w3.org/1999/xhtml" lang="en">
<!-- lang="en": the title and article text of this page are English, so English
     is declared as the document language for assistive technology. -->
  <head>
    <!-- Page metadata: the encoding declaration (kept first), authorship, and
         the git_* stamps written into this 6.1.1 documentation build. -->
    <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
    <meta content="Cask Data, Inc." name="author" />
    <meta content="Copyright © 2015-2017 Cask Data, Inc." name="copyright" />

    <meta name="git_release" content="6.1.1">
    <meta name="git_hash" content="05fbac36f9f7aadeb44f5728cea35136dbc243e5">
    <meta name="git_timestamp" content="2020-02-09 08:22:47 +0800">
    <title>Pentaho Data Integration</title>

    <!-- Stylesheets, listed in cascade order. -->
    <!-- NOTE(review): cdap-bootstrap.css is linked both first and last. The
         last link already wins the cascade, so the first one looks redundant;
         confirm before removing either. -->
    <link rel="stylesheet" href="_static/cdap-bootstrap.css" type="text/css" />
    <link rel="stylesheet" href="_static/pygments.css" type="text/css" />
    <link rel="stylesheet" href="_static/bootstrap-3.3.6/css/bootstrap.min.css" type="text/css" />
    <link rel="stylesheet" href="_static/bootstrap-3.3.6/css/bootstrap-theme.min.css" type="text/css" />
    <link rel="stylesheet" href="_static/css/bootstrap-sphinx.css" type="text/css" />
    <link rel="stylesheet" href="_static/css/cdap-dynamicscrollspy-4.css" type="text/css" />
    <link rel="stylesheet" href="_static/css/jquery.mCustomScrollbar.css" type="text/css" />
    <link rel="stylesheet" href="_static/css/cdap-jquery.mCustomScrollbar.css" type="text/css" />
    <link rel="stylesheet" href="_static/css/abixTreeList-2.css" type="text/css" />
    <link rel="stylesheet" href="_static/cdap-bootstrap.css" type="text/css" />

    <!-- Global options object defined before the scripts below are loaded;
         presumably read by doctools.js (confirm against that script). -->
    <script type="text/javascript">
      var DOCUMENTATION_OPTIONS = {
        URL_ROOT:    '',
        VERSION:     '6.1.1',
        COLLAPSE_INDEX: false,
        FILE_SUFFIX: '.html',
        HAS_SOURCE:  false
      };
    </script>
    <script type="text/javascript" src="_static/jquery.js"></script>
    <script type="text/javascript" src="_static/underscore.js"></script>
    <script type="text/javascript" src="_static/doctools.js"></script>
    <script type="text/javascript" src="_static/language_data.js"></script>

    <!-- Favicon and document relations (index, search, top, next, previous). -->
    <link rel="shortcut icon" href="_static/favicon.ico"/>
    <link rel="index" title="Index" href="genindex.html" />
    <link rel="search" title="Search" href="search.html" />
    <link rel="top" title="Cask Data Application Platform 6.1.1 Documentation" href="index.html" />
    <link rel="next" title="SquirrelSQL" href="squirrel.html" />
    <link rel="prev" title="CDAP ODBC Driver" href="odbc.html" />
    <!-- block extrahead -->
    <!-- The encoding is already declared by the Content-Type meta at the top
         of this head, and a document may carry only one encoding declaration,
         so no charset meta is repeated here. -->
    <meta http-equiv="X-UA-Compatible" content="IE=edge">
    <!-- No maximum-scale: capping the scale prevents users from zooming. -->
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <meta name="apple-mobile-web-app-capable" content="yes">
    <!-- block extrahead end -->

</head>
<body role="document">

<!-- block navbar -->
<!-- Fixed top bar: brand logo, collapse toggle, version dropdown, search form,
     and the four top-level section tabs. -->
<div id="navbar" class="navbar navbar-inverse navbar-default navbar-fixed-top">
    <div class="container-fluid">
      <div class="row">
        <div class="navbar-header">
          <a class="navbar-brand" href="table-of-contents/../../index.html">
            <span><img alt="CDAP logo" src="_static/cdap_logo.svg"/></span>
          </a>

          <!-- The .navbar-toggle button collapses/expands the element matched by
               its data-target (.nav-collapse). It contains only icon bars, so
               aria-label supplies its accessible name. -->
          <button type="button" class="navbar-toggle" data-toggle="collapse" data-target=".nav-collapse" aria-label="Toggle navigation">
            <span class="icon-bar"></span>
            <span class="icon-bar"></span>
            <span class="icon-bar"></span>
          </button>

          <div class="pull-right">
            <div class="dropdown version-dropdown">
              <a href="#" class="dropdown-toggle" data-toggle="dropdown"
                role="button" aria-haspopup="true" aria-expanded="false">
                v 6.1.1 <span class="caret"></span>
              </a>
              <ul class="dropdown-menu">
                <li><a href="//docs.cdap.io/cdap/5.1.2/en/index.html">v 5.1.2</a></li>
                <li><a href="//docs.cdap.io/cdap/4.3.4/en/index.html">v 4.3.4</a></li>
              </ul>
            </div>
          </div>
          <!-- Search form: submits q plus two hidden fields to search.html via GET.
               The placeholder is not a label, so aria-label names the field. -->
          <form class="navbar-form navbar-right navbar-search" action="search.html" method="get">
            <div class="form-group">
              <div class="navbar-search-image material-icons"></div>
              <input type="text" name="q" class="form-control" placeholder="  Search" aria-label="Search" />
            </div>
            <input type="hidden" name="check_keywords" value="yes" />
            <input type="hidden" name="area" value="default" />
          </form>

          <!-- Section tabs. The labels are Chinese, so each link declares
               lang="zh-Hans". The items stay on one line so that no whitespace
               is introduced between them. -->
          <div class="collapse navbar-collapse nav-collapse navbar-right navbar-navigation">
            <ul class="nav navbar-nav"><li class="docsite-nav-tab-container"><a class="docsite-nav-tab-link " href="table-of-contents/../../index.html" lang="zh-Hans">简介</a></li><li class="docsite-nav-tab-container"><a class="docsite-nav-tab-link current" href="table-of-contents/../../guides.html" lang="zh-Hans">手册</a></li><li class="docsite-nav-tab-container"><a class="docsite-nav-tab-link " href="table-of-contents/../../reference-manual/index.html" lang="zh-Hans">参考</a></li><li class="docsite-nav-tab-container"><a class="docsite-nav-tab-link " href="table-of-contents/../../faqs/index.html" lang="zh-Hans">帮助</a></li>
            </ul>
          </div>

        </div>
      </div>
    </div>
  </div><!-- block navbar end -->
<!-- block main content -->
<div class="main-container container">
  <div class="row"><div class="col-md-2">
      <!-- Left sidebar: links to each manual, with the page list of the
           integrations manual expanded beneath its entry. -->
      <div id="sidebar" class="bs-sidenav scrollable-y-outside" role="complementary">
<!-- theme_manual: integrations -->
<!-- theme_manual_highlight: guides -->
<!-- sidebar_title_link: table-of-contents/../../guides.html -->

  <div role="note" aria-label="manuals links"><h3><a href="table-of-contents/../../guides.html">Guides</a></h3>

    <!-- Manual titles are Chinese, so each link declares lang="zh-Hans". -->
    <ul class="this-page-menu">
      <li class="toctree-l1"><a href="table-of-contents/../../user-guide/index.html" rel="nofollow" lang="zh-Hans">用户手册</a>
      </li>
      <li class="toctree-l1"><a href="table-of-contents/../../developer-manual/index.html" rel="nofollow" lang="zh-Hans">开发手册</a>
      </li>
      <li class="toctree-l1"><a href="table-of-contents/../../admin-manual/index.html" rel="nofollow" lang="zh-Hans">管理手册</a>
      </li>
      <li class="toctree-l1"><b><a href="table-of-contents/../../integrations/index.html" rel="nofollow" lang="zh-Hans">集成手册</a></b>
      <!-- Pages of the integrations manual. The entry for this page carries
           aria-current="page" so the current location is exposed to assistive
           technology and not only through the "current" class. -->
      <nav class="pagenav" aria-label="Integrations manual">
      <ul class="current">
<li class="toctree-l1"><a class="reference internal" href="index.html"> Introduction</a></li>
<li class="toctree-l1"><a class="reference internal" href="hub.html"> Hub</a></li>
<li class="toctree-l1"><a class="reference internal" href="partners/cloudera/index.html"> Cloudera</a><ul>
<li class="toctree-l2"><a class="reference internal" href="partners/cloudera/ingesting.html"> Ingestion and Exploration</a></li>
</ul>
</li>
<li class="toctree-l1"><a class="reference internal" href="apache-sentry.html"> Apache Sentry</a></li>
<li class="toctree-l1"><a class="reference internal" href="apache-ranger.html"> Apache Ranger</a></li>
<li class="toctree-l1"><a class="reference internal" href="hadoop-kms.html"> Apache Hadoop KMS</a></li>
<li class="toctree-l1"><a class="reference internal" href="jdbc.html"> CDAP JDBC Driver</a></li>
<li class="toctree-l1"><a class="reference internal" href="odbc.html"> CDAP ODBC Driver</a></li>
<li class="toctree-l1 current"><a class="current reference internal" href="#" aria-current="page"> Pentaho Data Integration</a></li>
<li class="toctree-l1"><a class="reference internal" href="squirrel.html"> SquirrelSQL</a></li>
</ul>
</nav>
      </li>
      <li class="toctree-l1"><a href="table-of-contents/../../examples-manual/index.html" rel="nofollow" lang="zh-Hans">最佳实践</a>
      </li>
    </ul>
  </div></div>
    </div><div class="col-md-8 content" id="main-content">
    
  <!-- Article body: numbered steps for connecting Pentaho Data Integration to
       CDAP datasets through the CDAP JDBC driver. Screenshot alt texts
       summarise the step each image accompanies instead of repeating the
       image file path. -->
  <div class="section" id="pentaho-data-integration">
<span id="pentaho-integration"></span><h1>Pentaho Data Integration<a class="headerlink" href="#pentaho-data-integration" title="Permalink to this headline">🔗</a></h1>
<p><em>Pentaho Data Integration</em> is an advanced, open source business intelligence tool that can execute
transformations of data coming from various sources. Let’s see how to connect it to
CDAP datasets using the <a class="reference internal" href="jdbc.html#cdap-jdbc"><span class="std std-ref">CDAP JDBC driver</span></a>.</p>
<ol class="arabic">
<li><p class="first">Before opening the <em>Pentaho Data Integration</em> application, copy the
<code class="docutils literal notranslate"><span class="pre">io.cdap.cdap.cdap-explore-jdbc-</span></code><code class="docutils literal notranslate"><span class="pre">6.1.1</span></code><code class="docutils literal notranslate"><span class="pre">.jar</span></code>
file to the <code class="docutils literal notranslate"><span class="pre">lib</span></code> directory of <em>Pentaho Data Integration</em>, located at the root of the application’s directory.</p>
</li>
<li><p class="first">Open <em>Pentaho Data Integration</em>.</p>
</li>
<li><p class="first">In the toolbar, select <code class="docutils literal notranslate"><span class="pre">File</span> <span class="pre">-&gt;</span> <span class="pre">New</span> <span class="pre">-&gt;</span> <span class="pre">Database</span> <span class="pre">Connection...</span></code>.</p>
</li>
<li><p class="first">In the <code class="docutils literal notranslate"><span class="pre">General</span></code> section, select a <code class="docutils literal notranslate"><span class="pre">Connection</span> <span class="pre">Name</span></code>, such as <code class="docutils literal notranslate"><span class="pre">CDAP</span> <span class="pre">Sandbox</span></code>. For the <code class="docutils literal notranslate"><span class="pre">Connection</span> <span class="pre">Type</span></code>, select
<code class="docutils literal notranslate"><span class="pre">Generic</span> <span class="pre">database</span></code>. Select <code class="docutils literal notranslate"><span class="pre">Native</span> <span class="pre">(JDBC)</span></code> for the <code class="docutils literal notranslate"><span class="pre">Access</span></code> field. In this example, where we connect to
a CDAP Sandbox, our <code class="docutils literal notranslate"><span class="pre">Custom</span> <span class="pre">Connection</span> <span class="pre">URL</span></code> will then be <code class="docutils literal notranslate"><span class="pre">jdbc:cdap://localhost:11015</span></code>.
In the field <code class="docutils literal notranslate"><span class="pre">Custom</span> <span class="pre">Driver</span> <span class="pre">Class</span> <span class="pre">Name</span></code>, enter <code class="docutils literal notranslate"><span class="pre">io.cdap.cdap.explore.jdbc.ExploreDriver</span></code>.</p>
<a class="reference internal image-reference" href="_images/pentaho_add_connection.png"><img alt="Pentaho Database Connection dialog configured as a generic JDBC connection to the CDAP Sandbox" src="_images/pentaho_add_connection.png" style="width: 6in;" /></a>
</li>
<li><p class="first">Click on <code class="docutils literal notranslate"><span class="pre">OK</span></code>.</p>
</li>
<li><p class="first">To use this connection, navigate to the <code class="docutils literal notranslate"><span class="pre">Design</span></code> tab on the left of the main view. In the <code class="docutils literal notranslate"><span class="pre">Input</span></code> menu,
double click on <code class="docutils literal notranslate"><span class="pre">Table</span> <span class="pre">input</span></code>. It will create a new transformation containing this input.</p>
<a class="reference internal image-reference" href="_images/pentaho_table_input.png"><img alt="Pentaho Design tab with Table input chosen from the Input menu" src="_images/pentaho_table_input.png" style="width: 6in;" /></a>
</li>
<li><p class="first">Right-click on <code class="docutils literal notranslate"><span class="pre">Table</span> <span class="pre">input</span></code> in your transformation and select <code class="docutils literal notranslate"><span class="pre">Edit</span> <span class="pre">step</span></code>. You can specify an appropriate name
for this input such as <code class="docutils literal notranslate"><span class="pre">CDAP</span> <span class="pre">datasets</span> <span class="pre">query</span></code>. Under <code class="docutils literal notranslate"><span class="pre">Connection</span></code>, select the newly created database connection;
in this example, <code class="docutils literal notranslate"><span class="pre">CDAP</span> <span class="pre">Sandbox</span></code>. Enter a valid SQL query in the main <code class="docutils literal notranslate"><span class="pre">SQL</span></code> field. This will define the data
available to your transformation.</p>
<a class="reference internal image-reference" href="_images/pentaho_modify_input.png"><img alt="Pentaho Table input step editor with the CDAP Sandbox connection selected and an SQL query entered" src="_images/pentaho_modify_input.png" style="width: 6in;" /></a>
</li>
<li><p class="first">Click on <code class="docutils literal notranslate"><span class="pre">OK</span></code>. Your input is now ready to be used in your transformation, and it will contain data coming
from the results of the SQL query on the CDAP datasets.</p>
</li>
<li><p class="first">For more information on how to add components to a transformation and link them together, see the
<a class="reference external" href="http://community.pentaho.com/projects/data-integration/">Pentaho Data Integration page</a>.</p>
</li>
</ol>
</div>

</div>
    <div class="col-md-2">
      <!-- Right-hand column. #localtoc-scrollspy is empty in the markup;
           presumably filled at runtime by cdap-dynamicscrollspy-4.js with the
           on-page table of contents (confirm against that script). -->
      <div id="right-sidebar" class="bs-sidenav scrollable-y" role="complementary">
        <div id="localtoc-scrollspy">
        </div>
      </div>
    </div></div>
</div>
<!-- block main content end -->
<!-- block footer -->
<!-- Page footer: previous/next page links on either side of the copyright,
     archive download, and version-switch links. The previous/next anchors use
     ordinary start and end tags; <a> is not a void element, so self-closing
     syntax on it is a parse error. -->
<footer class="footer">
      <div class="container">
        <div class="row">
          <div class="col-md-2 footer-left"><a title="CDAP ODBC Driver" href="odbc.html">Previous</a></div>
          <div class="col-md-8 footer-center"><a class="footer-tab-link" href="table-of-contents/../../reference-manual/licenses/index.html">Copyright</a> &copy; 2014-2020 Cask Data, Inc.&bull; <a class="footer-tab-link" href="//docs.cask.co/cdap/6.1.1/cdap-docs-6.1.1-web.zip" rel="nofollow">Download</a> an archive or
<a class="footer-tab-link" href="//docs.cask.co/cdap">switch the version</a> of the documentation
          </div>
          <div class="col-md-2 footer-right"><a title="SquirrelSQL" href="squirrel.html">Next</a></div>
        </div>
      </div>
    </footer>
<!-- block footer end -->
<!-- Scripts loaded at the end of the body, in their original order. -->
<!-- NOTE(review): cdap-version-menu.js is included twice (fifth and last in
     the local list). Both are kept because the effect of running it a second
     time is not visible from this page; confirm and drop one if redundant. -->
<script type="text/javascript" src="_static/bootstrap-3.3.6/js/bootstrap.min.js"></script>
<script type="text/javascript" src="_static/js/bootstrap-sphinx.js"></script>
<script type="text/javascript" src="_static/js/abixTreeList-2.js"></script>
<script type="text/javascript" src="_static/js/cdap-dynamicscrollspy-4.js"></script>
<script type="text/javascript" src="_static/js/cdap-version-menu.js"></script>
<script type="text/javascript" src="_static/js/copy-to-clipboard.js"></script>
<script type="text/javascript" src="_static/js/jquery.mousewheel.min.js"></script>
<script type="text/javascript" src="_static/js/jquery.mCustomScrollbar.js"></script>
<script type="text/javascript" src="_static/js/js.cookie.js"></script>
<script type="text/javascript" src="_static/js/tabbed-parsed-literal-0.2.js"></script>
<script type="text/javascript" src="_static/js/cdap-onload-javascript.js"></script>
<script type="text/javascript" src="_static/js/cdap-version-menu.js"></script>
    <!-- Externally hosted version list. <script> is not a void element, so it
         is written with an ordinary start tag and end tag. -->
    <script src="https://cdap.gitee.io/docs/cdap/json-versions.js"></script>
  </body>
</html>